% Journal article. The journal name is stored in full without a trailing
% acronym. "pages" holds the single value 7, presumably the ACM article
% number rather than a page range -- TODO confirm.
@article{main,
  author    = {Wang, Xinxi and Wang, Yi and Hsu, David and Wang, Ye},
  title     = {Exploration in Interactive Personalized Music Recommendation: A Reinforcement Learning Approach},
  journal   = {ACM Transactions on Multimedia Computing, Communications, and Applications},
  volume    = {11},
  number    = {1},
  pages     = {7},
  year      = {2014},
  publisher = {ACM},
}

% Textbook. Publisher and city live in separate fields. A book entry must not
% carry both volume and number (classic styles warn), so neither is given.
@book{sutton1998reinforcement,
  author    = {Sutton, Richard S. and Barto, Andrew G.},
  title     = {Reinforcement Learning: An Introduction},
  publisher = {MIT Press},
  address   = {Cambridge, MA},
  year      = {1998},
}

% Document issued by a university rather than a journal, so it is typed as a
% techreport with the issuing body in "institution" and its city in "address".
@techreport{algoandmethodsinrecommender,
  author      = {Asanov, Daniar},
  title       = {Algorithms and Methods in Recommender Systems},
  institution = {Berlin Institute of Technology},
  address     = {Berlin, Germany},
  year        = {2011},
}

% English translation of a monograph: a book, not a journal article. The
% translators are credited in "note" so that every classic style prints them.
@book{ebbinghaus1913memory,
  author    = {Ebbinghaus, Hermann},
  title     = {Memory: A Contribution to Experimental Psychology},
  publisher = {Teachers College, Columbia University},
  address   = {New York},
  year      = {1913},
  note      = {Translated by Henry A. Ruger and Clara E. Bussenius},
}


% NOTE(review): publisher, edition and series describe the 2002 second edition
% of this monograph -- confirm that this is the edition being cited.
@book{principalcompanalysis,
  author    = {Jolliffe, Ian},
  title     = {Principal Component Analysis},
  edition   = {Second},
  series    = {Springer Series in Statistics},
  publisher = {Springer},
  address   = {New York},
  year      = {2002},
}

% NOTE(review): the title is that of the opening chapter of the handbook, so
% the entry is typed as a chapter in an edited book. Confirm the editor list
% and page range, or retitle to cite the handbook as a whole.
@incollection{recommendersystemhandbook,
  author    = {Ricci, Francesco and Rokach, Lior and Shapira, Bracha},
  title     = {Introduction to Recommender Systems Handbook},
  editor    = {Ricci, Francesco and Rokach, Lior and Shapira, Bracha and Kantor, Paul B.},
  booktitle = {Recommender Systems Handbook},
  pages     = {1--35},
  publisher = {Springer},
  year      = {2011},
}

% Journal article from an ACM export. The brand name in the title is braced so
% sentence-casing styles keep its capital. "pages" uses the ACM
% article:page form (article 13, 19 pages). The non-standard ACM fields are
% retained; standard styles ignore them.
@article{netflix-article-recommender,
  author     = {Gomez-Uribe, Carlos A. and Hunt, Neil},
  title      = {The {Netflix} Recommender System: Algorithms, Business Value, and Innovation},
  journal    = {ACM Transactions on Management Information Systems},
  volume     = {6},
  number     = {4},
  pages      = {13:1--13:19},
  month      = dec,
  year       = {2015},
  issue_date = {January 2016},
  articleno  = {13},
  numpages   = {19},
  issn       = {2158-656X},
  doi        = {10.1145/2843948},
  url        = {https://doi.org/10.1145/2843948},
  acmid      = {2843948},
  publisher  = {ACM},
  address    = {New York, NY, USA},
  keywords   = {Recommender systems},
}


% Conference paper. ACM is recorded as the publisher of the proceedings; the
% proceedings title is capitalised because styles do not recase "booktitle".
@inproceedings{li2010contextual,
  author    = {Li, Lihong and Chu, Wei and Langford, John and Schapire, Robert E.},
  title     = {A Contextual-Bandit Approach to Personalized News Article Recommendation},
  booktitle = {Proceedings of the 19th International Conference on World Wide Web},
  pages     = {661--670},
  year      = {2010},
  publisher = {ACM},
}

% Conference paper. The title carries no trailing period (the style supplies
% punctuation). NOTE(review): the proceedings title is expanded from the bare
% acronym -- confirm the ordinal against the published proceedings.
@inproceedings{lu2010contextual,
  author    = {Lu, Tyler and P{\'a}l, D{\'a}vid and P{\'a}l, Martin},
  title     = {Contextual Multi-Armed Bandits},
  booktitle = {Proceedings of the Thirteenth International Conference on Artificial Intelligence and Statistics ({AISTATS})},
  pages     = {485--492},
  year      = {2010},
}

% arXiv preprint, not a journal article. The identifier is stored in the
% eprint fields and as a URL. Styles without eprint/url support print only the
% "howpublished" text.
@misc{kuleshov2014algorithms,
  author        = {Kuleshov, Volodymyr and Precup, Doina},
  title         = {Algorithms for Multi-Armed Bandit Problems},
  howpublished  = {arXiv preprint},
  eprint        = {1402.6028},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/1402.6028},
  year          = {2014},
}

% Conference paper. The title carries no trailing period (the style supplies
% punctuation). NOTE(review): the proceedings title is expanded from the bare
% acronym and the publisher is supplied from the proceedings volume -- confirm
% both against the published proceedings.
@inproceedings{cesa1998finite,
  author    = {Cesa-Bianchi, Nicol{\`o} and Fischer, Paul},
  title     = {Finite-Time Regret Bounds for the Multiarmed Bandit Problem},
  booktitle = {Proceedings of the Fifteenth International Conference on Machine Learning ({ICML})},
  pages     = {100--108},
  year      = {1998},
  publisher = {Morgan Kaufmann},
}


% Conference paper. Springer is recorded as the publisher of the proceedings;
% the conference name is capitalised because styles do not recase "booktitle".
@inproceedings{vermorel2005multi,
  author    = {Vermorel, Joannes and Mohri, Mehryar},
  title     = {Multi-Armed Bandit Algorithms and Empirical Evaluation},
  booktitle = {European Conference on Machine Learning},
  pages     = {437--448},
  year      = {2005},
  publisher = {Springer},
}
